@@ -0,0 +1,83 @@ |
||
1 |
+require 'csv' |
|
2 |
+ |
|
3 |
+module Agents |
|
4 |
+ class SentimentAgent < Agent |
|
5 |
+ class_attribute :anew |
|
6 |
+ |
|
7 |
+ cannot_be_scheduled! |
|
8 |
+ |
|
9 |
+ description <<-MD |
|
10 |
+ The SentimentAgent generates `good-bad` (psychological valence or happiness index), `active-passive` (arousal), |
|
11 |
+ and `strong-weak` (dominance) score. It will output a value between 1 and 9. |
|
12 |
+ |
|
13 |
+ Make sure the content this agent is analyzing have sufficient length to get respectable results. |
|
14 |
+ |
|
15 |
+ Provide a JSONPath in `content` field where content is residing and set `expected_receive_period_in_days` to the maximum number of days you would allow to be passed between events being received by this agent. |
|
16 |
+ MD |
|
17 |
+ |
|
18 |
+ event_description <<-MD |
|
19 |
+ Events look like: |
|
20 |
+ { |
|
21 |
+ :content => "The quick brown fox jumps over the lazy dog.", |
|
22 |
+ :valence => 6.196666666666666, |
|
23 |
+ :arousal => 4.993333333333333, |
|
24 |
+ :dominance => 5.63 |
|
25 |
+ } |
|
26 |
+ MD |
|
27 |
+ |
|
28 |
+ def default_options |
|
29 |
+ { |
|
30 |
+ :content => "$.message.text[*]", |
|
31 |
+ :expected_receive_period_in_days => 1 |
|
32 |
+ } |
|
33 |
+ end |
|
34 |
+ |
|
35 |
+ def working? |
|
36 |
+ last_receive_at && last_receive_at > options[:expected_receive_period_in_days].to_i.days.ago |
|
37 |
+ end |
|
38 |
+ |
|
39 |
+ def receive(incoming_events) |
|
40 |
+ anew = self.class.sentiment_hash |
|
41 |
+ incoming_events.each do |event| |
|
42 |
+ Utils.values_at(event.payload, options[:content]).each do |content| |
|
43 |
+ sent_values = sentiment_values anew, content |
|
44 |
+ create_event :payload => {:content => content, |
|
45 |
+ :valence => sent_values[0], |
|
46 |
+ :arousal => sent_values[1], |
|
47 |
+ :dominance => sent_values[2]} |
|
48 |
+ end |
|
49 |
+ end |
|
50 |
+ end |
|
51 |
+ |
|
52 |
+ def validate_options |
|
53 |
+ errors.add(:base, "content and expected_receive_period_in_days must be present") unless options[:content].present? && options[:expected_receive_period_in_days].present? |
|
54 |
+ end |
|
55 |
+ |
|
56 |
+ def self.sentiment_hash |
|
57 |
+ unless self.anew |
|
58 |
+ self.anew = {} |
|
59 |
+ CSV.foreach Rails.root.join('data/anew.csv') do |row| |
|
60 |
+ self.anew[row[0]] = row.values_at(2,4,6).map {|val| val.to_f} |
|
61 |
+ end |
|
62 |
+ end |
|
63 |
+ self.anew |
|
64 |
+ end |
|
65 |
+ |
|
66 |
+ def sentiment_values(anew,text) |
|
67 |
+ valence, arousal, dominance, freq = [0] * 4 |
|
68 |
+ text.downcase.strip.gsub(/[^a-z ]/,"").split.each do |word| |
|
69 |
+ if anew.has_key? word |
|
70 |
+ valence += anew[word][0] |
|
71 |
+ arousal += anew[word][1] |
|
72 |
+ dominance += anew[word][2] |
|
73 |
+ freq += 1 |
|
74 |
+ end |
|
75 |
+ end |
|
76 |
+ if valence != 0 |
|
77 |
+ [valence/freq, arousal/freq, dominance/freq] |
|
78 |
+ else |
|
79 |
+ ["Insufficient data for meaningful answer"] * 3 |
|
80 |
+ end |
|
81 |
+ end |
|
82 |
+ end |
|
83 |
+end |